#!/bin/sh
# Start the vLLM OpenAI-compatible API server in the background and send its
# combined stdout/stderr through Apache `rotatelogs`.
#
# Server: listens on port 8000, loads the model from
#   /home/test/models/Qwen3-32B and exposes it to clients as "QwQ-32B".
#   NOTE(review): the served name (QwQ-32B) differs from the model directory
#   (Qwen3-32B). It is left unchanged because clients may already request
#   that name -- confirm this is intentional.
# Logs: written relative to the current working directory as
#   qwen3.log.<YYYYmmddHHMM>; `-f` opens the first file immediately and
#   `100M` rotates on size.
(
  # Ignore SIGHUP for the WHOLE pipeline. `nohup` alone only protects the
  # python3 stage; without this, a terminal hangup can kill rotatelogs, after
  # which the server's next log write hits a broken pipe. Ignored signals are
  # inherited across exec, so both stages are covered.
  trap '' HUP

  nohup python3 -m vllm.entrypoints.openai.api_server \
    --port=8000 \
    --model /home/test/models/Qwen3-32B \
    --served-model-name QwQ-32B \
    --gpu-memory-utilization 0.90 \
    --enable-auto-tool-choice \
    --tool-call-parser hermes \
    --tensor-parallel-size 8 \
    2>&1 \
    | rotatelogs -f qwen3.log.%Y%m%d%H%M 100M
) &

